import cache

class Corpus(object):
    """A tokenized text corpus read from a file with one sentence per line.

    Attributes:
        language: The language value passed to the constructor, stored as-is.
        corpus: List of sentences; each sentence is a list of string tokens.
    """

    def __init__(self, file, language):
        """Create the corpus and immediately load sentences from ``file``.

        Args:
            file: Path (or anything accepted by ``open``) of the corpus file.
            language: Language value to associate with this corpus.
        """
        self.language = language
        self.corpus = []
        self.load_corpus(file)

    def load_corpus(self, file):
        """Append every line of ``file`` to ``self.corpus`` as a token list.

        Newline characters are removed from each line and the remainder is
        split on single space characters. Because the split is on exactly
        one space, consecutive spaces produce empty-string tokens and a
        blank line yields ``['']``.

        Calling this method more than once appends to the sentences that
        are already loaded; it does not reset ``self.corpus``.

        Args:
            file: Path (or anything accepted by ``open``) of the corpus file.
        """
        # The context manager guarantees the handle is closed even when
        # reading raises (e.g. an I/O or decoding error).
        with open(file) as f:
            lines = f.readlines()
        # Tokenize only after the whole file was read successfully, so a
        # failed read never leaves a partially extended corpus behind.
        self.corpus.extend(line.replace('\n', '').split(' ') for line in lines)

